---
# Application list for this deployment; a single application is defined.
# NOTE(review): the key layout looks like a Ray Serve config file — confirm
# against the tool that consumes this file.
applications:
  - name: ray-llm
    # Route prefix for the application; "/" is the root path.
    route_prefix: /
    # "module:attribute" style reference to the application entry point.
    import_path: rayllm.backend:router_application
    args:
      # Model definition files handed to the application as its `models` arg.
      # The path is relative — presumably resolved against the working
      # directory the service is launched from; verify before moving the file.
      models:
        - './models/continuous_batching/quantization/TheBloke--Llama-2-70B-chat-AWQ.yaml'